package com.quiz.bis.domain.model;


import lombok.Data;

import java.util.List;

/**
 * Text information produced by preprocessing.
 *
 * <p>Getters, setters, {@code equals}, {@code hashCode} and {@code toString}
 * are generated by Lombok's {@code @Data}; only the all-arguments constructor
 * is written by hand.
 */
@Data
public class ProcessedText {
    /** Plain text after cleaning. */
    private String cleanText;

    /** Word segmentation result. */
    private List<String> words;

    /** Formulas extracted from the text. */
    private List<String> formulas;

    /** IDs of the images extracted from the text. */
    private List<Long> imageIds;

    /** HTML of the tables extracted from the text. */
    private List<String> tables;

    /**
     * Creates an instance holding every preprocessing output.
     *
     * <p>Each argument is stored exactly as passed in: no null checks are
     * performed and the lists are not copied.
     *
     * @param cleanText plain text after cleaning
     * @param words     word segmentation result
     * @param formulas  extracted formulas
     * @param imageIds  extracted image IDs
     * @param tables    extracted table HTML
     */
    public ProcessedText(String cleanText,
                         List<String> words,
                         List<String> formulas,
                         List<Long> imageIds,
                         List<String> tables) {
        // Extracted artifacts.
        this.tables = tables;
        this.imageIds = imageIds;
        this.formulas = formulas;
        // Textual content.
        this.words = words;
        this.cleanText = cleanText;
    }
}
